class TrainConstants:
    """Training-related constants.

    A plain namespace of integer class attributes; it is not meant to be
    instantiated. Read values as ``TrainConstants.NAME``.
    """

    # --- Default sizes / capacity limits -------------------------------
    # NOTE(review): what each size bounds (buffer, win-rate history, ...) is
    # inferred from the names only; confirm against the call sites.
    DEFAULT_BUFFER_SIZE: int = 1_000
    DEFAULT_WIN_RATES_SIZE: int = 100
    MAX_RECENT_COMPARISONS: int = 5
    MAX_THREAT_EPISODES: int = 1_000

    # --- Episode defaults ----------------------------------------------
    # Presumably a fallback average when no measured step count is available
    # yet; verify at the use site.
    DEFAULT_AVG_STEPS_PER_EPISODE: int = 50

    # --- Sentinels and player identifiers ------------------------------
    # INVALID_ACTION and OPPONENT_PLAYER share the value -1, so the two
    # cannot be told apart by value alone.
    INVALID_ACTION: int = -1
    AI_PLAYER: int = 1
    OPPONENT_PLAYER: int = -1